library(tidyverse)
[30m── [1mAttaching packages[22m ───────────────────────────────────────────────────────────────────────────────────────── tidyverse 1.2.1 ──[39m
[30m[32m✔[30m [34mggplot2[30m 3.0.0 [32m✔[30m [34mpurrr [30m 0.2.5
[32m✔[30m [34mtibble [30m 1.4.2 [32m✔[30m [34mdplyr [30m 0.7.6
[32m✔[30m [34mtidyr [30m 0.8.1 [32m✔[30m [34mstringr[30m 1.3.1
[32m✔[30m [34mreadr [30m 1.1.1 [32m✔[30m [34mforcats[30m 0.3.0[39m
[30m── [1mConflicts[22m ──────────────────────────────────────────────────────────────────────────────────────────── tidyverse_conflicts() ──
[31m✖[30m [34mdplyr[30m::[32mfilter()[30m masks [34mstats[30m::filter()
[31m✖[30m [34mdplyr[30m::[32mlag()[30m masks [34mstats[30m::lag()[39m
library(lubridate)
Attaching package: ‘lubridate’
The following object is masked from ‘package:base’:
date
# Load the three raw CSV exports; the first line of each file is its header.
dt_issues <- read.csv(file = "data/issues_data.csv", header = TRUE)
dt_star <- read.csv(file = "data/stargazers.csv", header = TRUE)
dt_user <- read.csv(file = "data/users_data.csv", header = TRUE)
# Preview each raw table by showing its first 10 rows.
head(dt_issues, n = 10)
head(dt_star, n = 10)
head(dt_user, n = 10)
# User dataset cleaning ----
# Step 1: drop the columns that are not used further on.
dt_user_cld <- select(
  dt_user,
  -c(
    X_id, avatar_url, events_url, followers_url, following_url,
    gists_url, gravatar_id, html_url, node_id, public_gists,
    received_events_url, repos_url, site_admin, starred_url,
    subscriptions_url, type
  )
)
# Step 2: parse the two timestamp columns into date-time values and turn the
# free-text factor columns into plain character vectors.
dt_user_cld <- mutate(
  dt_user_cld,
  created_at = lubridate::ymd_hms(created_at),
  updated_at = lubridate::ymd_hms(updated_at),
  bio = as.character(bio),
  blog = as.character(blog),
  company = as.character(company),
  email = as.character(email),
  location = as.character(location),
  login = as.character(login),
  name = as.character(name),
  organizations_url = as.character(organizations_url),
  url = as.character(url)
)
# Show the column types of the cleaned table.
str(dt_user_cld)
'data.frame': 39987 obs. of 16 variables:
$ bio : chr "" "" "" "" ...
$ blog : chr "" "" "" "" ...
$ company : chr "" "" "" "" ...
$ created_at : POSIXct, format: "2016-07-12 05:17:50" "2016-08-27 14:04:23" "2015-06-19 13:57:11" "2017-01-14 03:30:31" ...
$ email : chr "" "mytempbh@outlook.com" "n1085633848@outlook.com" "" ...
$ followers : int 9 4 7 2 0 2 13 5 1 0 ...
$ following : int 16 38 14 89 0 0 21 126 48 1 ...
$ hireable : Factor w/ 2 levels "","True": 1 1 1 1 1 1 1 1 1 1 ...
$ id : int 20412837 21278892 12967679 25113799 34975530 16221698 17765748 19787172 20368646 16677599 ...
$ location : chr "" "" "" "" ...
$ login : chr "moloach" "bhxch" "YueNing" "BigFaceCatMhc" ...
$ name : chr "" "Zhe Lee" "naodongbanana" "" ...
$ organizations_url: chr "https://api.github.com/users/moloach/orgs" "https://api.github.com/users/bhxch/orgs" "https://api.github.com/users/YueNing/orgs" "https://api.github.com/users/BigFaceCatMhc/orgs" ...
$ public_repos : int 10 34 29 4 0 26 93 102 13 2 ...
$ updated_at : POSIXct, format: "2019-03-09 00:15:05" "2019-03-09 09:30:45" "2019-03-25 10:50:50" "2019-03-28 00:02:38" ...
$ url : chr "https://api.github.com/users/moloach" "https://api.github.com/users/bhxch" "https://api.github.com/users/YueNing" "https://api.github.com/users/BigFaceCatMhc" ...
# Tally users per self-reported company, ignoring users who left the field
# blank, and order the tally from most to least common.
company_info <- dt_user_cld %>%
  filter(company != "") %>%
  group_by(company) %>%
  summarise(count = n()) %>%
  arrange(desc(count))
# Show the company/count table.
company_info
# Print the company names in the same order as the table.
print(company_info[["company"]])
[1] "Tencent" "Baidu" "Alibaba"
[4] "Zhejiang University" "JD" "Tsinghua University"
[7] "baidu" "Shanghai Jiao Tong University" "UESTC"
[10] "Peking University" "Nanjing University" "None"
[13] "null" "SJTU" "none"
[16] "China" "Netease" "@Alibaba"
[19] "BUPT" "USTC" "Wuhan University"
[22] "ZJU" "alibaba" "NetEase"
[25] "ThoughtWorks" "@Tencent" "Fudan University"
[28] "Harbin Institute of Technology" "HUST" "meituan"
[31] "NULL" "Bytedance" "Xidian University"
[34] "百度" "@alibaba" "Alibaba Group"
[37] "Beijing Institute of Technology" "JD.COM" "Alibaba Inc."
[40] "Alipay" "baidu.com" "Beihang University"
[43] "Beijing University of Posts and Telecommunications" "Carnegie Mellon University" "JD.com"
[46] "NJU" "SYSU" "DiDi"
[49] "eleme" "free" "Freelancer"
[52] "Google" "Microsoft" "no"
[55] "South China University of Technology" "tencent" "@bytedance"
[58] "@Microsoft " "@tencent" "Baidu, Inc."
[61] "BIT" "BUAA" "china"
[64] "East China Normal University" "HIT" "Huawei"
[67] "Neusoft" "Southeast University" "Sun Yat-sen University"
[70] "Tongji University" "Xiamen University" "Xiaomi"
[73] "360" "ByteDance" "ECNU"
[76] "Home" "Huazhong University of Science and Technology" "ICT"
[79] "inspur" "Meitu" "Meituan"
[82] "Null" "Qihoo 360" "SCUT"
[85] "Sichuan University" "student" "Student"
[88] "WHU" "xiaomi" "ZTE"
[91] "滴滴出行" "@baidu " "@Meituan-Dianping"
[94] "@Microsoft" "@XiaoMi" "Alibaba Cloud"
[97] "alipay" "Ant Financial" "Beijing Jiaotong University"
[100] "bilibili" "bupt" "Cheetah Mobile"
[103] "CN" "Dalian University of Technology" "Didi"
[106] "IBM" "Intel" "jd"
[109] "jd.com" "LeetCode" "Lenovo"
[112] "Nankai University" "netease" "Oracle"
[115] "ShanghaiTech University" "SUSE" "SUSTech"
[118] "TAL" "THU" "Weibo"
[121] "小红书" "无" "美团点评"
[124] "@Alipay" "@baidu" "@eleme"
[127] "@meituan" "@meituan-dianping" "@Netease"
[130] "@ZangaiFamily " "2dfire" "asiainfo"
[133] "beijing" "Bilibili" "bytedance"
[136] "CASIA" "CETC" "China Telecom"
[139] "Chongqing University" "Columbia University" "CQUPT"
[142] "dianping.com" "Freelance" "GDUT"
[145] "Grab" "HKUST" "iflytek"
[148] "Iflytek" "Inspur" "iqiyi"
[151] "Jilin University" "Kingsoft" "Lianjia"
[154] "MIT" "MTDP" "Nanyang Technological University"
[157] "NCEPU" "NetEase Games" "no company"
[160] "nothing" "NWPU" "NYU"
[163] "personal" "Qiniu" "Qunar"
[166] "SHU" "Sina" "suning"
[169] "Tencent Inc." "Tianjin University" "Tsinghua"
[172] "UCAS" "UCloud" "University of Edinburgh"
[175] "University of Electronic Science and Technology of China" "University of Minnesota" "University of Southern California"
[178] "University of Washington" "unknown" "UW-Madison"
[181] "VIPKID" "Virginia Tech" "ximalaya"
[184] "XMU" "Youzan" "YY Inc."
[187] "zte" "ʕ•̫͡•ʔ-̫͡-ʕ•͓͡•ʔ-̫͡-ʔ" "京东"
[190] "今日头条" "大搜车" "好未来"
[193] "无业游民" "自由职业" "阿里巴巴"
[196] "?" "." "..."
[199] "@" "@alibaba " "@alipay"
[202] "@apache" "@b3log " "@Baidu"
[205] "@banggood" "@bearyinnovative " "@bilibili"
[208] "@Bilibili" "@BISTU" "@chaitin"
[211] "@ctripcorp" "@google" "@iqiyi"
[214] "@justice-code " "@Kyligence " "@Mobike"
[217] "@MobileNowGroup " "@Muxi-Studio" "@myteksi "
[220] "@netease" "@NetEase" "@pingcap "
[223] "@RedrockTeam " "@ruguoapp " "@Seniverse"
[226] "@TalkingData " "@thoughtworks" "@ThoughtWorks"
[229] "@Tradeshift " "@wacai" "@weibocom"
[232] "@xiachufang " "@xiaomi" "@youzan"
[235] "@youzan " "@zaihui" "@zhihu"
[238] "***" "~" "1"
[241] "360企业安全" "a" "Aalto University"
[244] "ABC" "Alauda" "alibaba-inc"
[247] "Alibaba.inc" "Amazon" "arxanfintech"
[250] "Asiainfo" "Atommatrix" "Beijing"
[253] "Beijing Forestry University" "Beijing Normal University" "Beijing,China"
[256] "BISTU" "BJTU" "bonc"
[259] "Booking.com" "Bytedance Inc." "Bytedance.Inc"
[262] "Camera360" "CC" "Central South University"
[265] "China Mobile Communications Corporation" "Chinese Academy of Sciences" "Cisco"
[268] "CMB" "cmcm" "CMU"
[271] "CQU" "creditease" "csust"
[274] "ctrip" "Ctrip" "Ctrip.com"
[277] "Dianping" "didi" "DIDI"
[280] "DLUT" "DotC United Group" "Douban Inc."
[283] "DZH" "eBay" "ele.me"
[286] "ELEME Inc." "elong" "FE"
[289] "Freedom" "freelance" "freelancer"
[292] "Georgetown University" "google" "gyyx"
[295] "GZHU" "Hand" "Hangzhou Dianzi University"
[298] "HDU" "HFUT" "Hohai University"
[301] "home" "Horizon Robotics" "HP"
[304] "https://github.com/eleme" "Huazhong University of Science & Technology" "hundsun"
[307] "hust" "HW" "ICT, CAS"
[310] "Indie Developer" "Infosys" "JNU"
[313] "jumei" "Kingdee" "Kingnet"
[316] "Kwai" "liulishuo" "LLS"
[319] "Magic" "Mars" "Megvii"
[322] "Meili-inc" "meituan.com" "meizu"
[325] "Microsoft Corporation" "mistong" "MOGU"
[328] "Momenta" "N/A" "NaN"
[331] "Nanchang University" "National University of Singapore" "ND"
[334] "NEUQ" "NIO" "No"
[337] "NO" "Northwestern Polytechnical University" "NUAA"
[340] "Open to Opportunities" "oraro" "OSU"
[343] "out of work" "pinduoduo" "pingan"
[346] "PingAn" "PKU" "PPTV"
[349] "PWRD" "Qihoo360" "Qudian"
[352] "Renmin University of China" "RingCentral" "Rutgers"
[355] "saic" "Samsung" "Sankuai"
[358] "school" "SCNU" "SCP Foundation"
[361] "sensetime" "SenseTime" "Shanbay"
[364] "Shandong University" "Shanghai" "Shanghai Jiao Tong Univ."
[367] "Shanghai Jiaotong University" "ShenZhen University" "SiChuan University"
[370] "sina" "SMZDM" "Soochow University"
[373] "souche.com" "South China Normal University" "Splunk"
[376] "Sun Yat-Sen University" "SUT" "SWJTU"
[379] "TalkingData" "TCL" "The Hong Kong Polytechnic University"
[382] "The NetCircle" "Tsinghua university" "TsingHua University"
[385] "ucas" "Uestc" "undefined"
[388] "University of Melbourne" "UNSW" "upyun"
[391] "USTB" "vip.com" "vipkid"
[394] "vipshop" "weixin" "www.iflytek.com"
[397] "wx" "xiaoi.com" "youzan"
[400] "YY.Inc" "Zhejiang University of Technology" "Zhihu"
[403] "Zhihu Inc." "zju" "上海灵娱网络科技"
[406] "中国" "二维火" "保密"
[409] "华为技术有限公司" "同花顺" "小米科技"
[412] "微店" "欢聚时代" "百姓网"
[415] "百度外卖" "重庆邮电大学" " @clustar.ai"
[418] " BaiFenDian Information Technology CO., LTD." " Harbin Institute of Technology, Zhejiang University" " NEC"
[421] " nugget" " TG" " ViceCity @ChillingEffect"
[424] " 上海奕明文化传媒有限公司" " 为中国孱弱的技术, 撑起一片自立自强的天空。" " 众安在线财产保险股份有限公司"
[427] " 无" "-" "--"
[430] "---" ": )" "...."
[433] ".NET" "(╯' - ')╯︵ ┻━┻ " "(주)에어텔닷컴"
[436] "(保密)" "(湖南)大农科技股份有限公司" "[Snriud] Co,ltd"
[439] "{{company}}" "『82.99 F.M』" "@ "
[442] "@ NUAA" "@01org" "@0x8023 "
[445] "@2048li" "@2345" "@24OI"
[448] "@24OI " "@258ch @ApacheCN " "@360"
[451] "@3rdStone @apachecn " "@4paradigm" "@51nb"
[454] "@55haitao" "@75team" "@7moor.com"
[457] "@811Noobs @wenon-dev " "@Accedo-Products " "@acgzone"
[460] "@ACLoong " "@AI" "@aimacity "
[463] "@airbnb " "@AirLoft " "@airteltour "
[466] "@alauda" "@alibaba @kubernetes" "@alibaba @ucweb"
[469] "@Alibaba International UED" "@alibabapictures" "@Alipay @macacajs"
[472] "@aliyun" "@Alkaids " "@alo7 "
[475] "@amazon.com" "@ample-cosplay " "@ampproject "
[478] "@android-plugin " "@AndroidConcentrationCamp" "@ant-design "
[481] "@Aobeef " "@apache " "@apachecn "
[484] "@apoiase" "@apollo-rescue" "@apple "
[487] "@AriadneThread " "@ARM" "@arqamfc"
[490] "@Asiainfo" "@Asuri-Team " "@athm-fe "
[493] "@australiaitgroup " "@AzukiCloud " "@b3log @FangStarNet "
[496] "@BaaSCMIoT" "@Babylonpartners " "@Baoban "
[499] "@BayatGames " "@bendcap" "@BiJie "
[502] "@bilibili " "@Bilibili bilibili" "@BIMK "
[505] "@bingblue " "@biztrology" "@blogs-dev "
[508] "@bmqb @itsCoder " "@bomquote " "@Botpy "
[511] "@breadtrip " "@breakdev " "@brlf-gz "
[514] "@browserstack" "@bupt" "@BUPT"
[517] "@Bytedance" "@ByteDance" "@ByteDance @Muxi-Studio"
[520] "@bytedance-hotsoon" "@bzy-ai " "@cachemoment "
[523] "@CactusBall " "@Caijijijijijiji" "@Canaan-Creative "
[526] "@cba " "@CDEFLS" "@chaitin "
[529] "@CHINA-JD @tiglabs" "@chinacourt" "@chinapexlabs "
[532] "@chinese-poetry " "@CIS2016 " "@CitoryTech "
[535] "@cjfed" "@cloud-ace" "@Cloud4est "
[538] "@cntehang" "@CoconutIslandStudio" "@codeparkhouston"
[541] "@coderemixer " "@Coding " "@computer-lab "
[544] "@coolspan" "@CovenantSQL " "@cqmbr @cqlinkoff @open-data-plan "
[547] "@CR" "@cryptomint" "@CSIRO-enviro-informatics "
[550] "@cumtflyingstudio " "@CVEO Wuhan University " "@Daimler RD/C TI"
[553] "@DanmakuPie " "@DaoCloud" "@DaoCloud "
[556] "@DaoCloud @Apache " "@DeepNorthAI " "@deepwn "
[559] "@defencedriver " "@demlution " "@DGeneAI "
[562] "@disject " "@Dispatchr @ServiceNow" "@dopobo"
[565] "@douban" "@Douban" "@DrPandaLtd "
[568] "@duocloud " "@DXY-F2E " "@easemob "
[571] "@eastern-all-stars" "@EasyHexo " "@ECNU @NVIDIA"
[574] "@eduvo" "@EigenLab" "@EigenLab "
[577] "@ejoy " "@ele.me" "@electron "
[580] "@eleme " "@emqx" "@Ericsson"
[583] "@Eros-Engine" "@exacloud" "@exacloud "
[586] "@ExpediaInc " "@F4ERP" "@Fenlly"
[589] "@flat-dev-ti " "@Forms" "@fox-one "
[592] "@frapsoft " "@Fusemachines" "@fusioncharts"
[595] "@gansutianqi " "@gaoding-inc" "@GeekPark "
[598] "@GitHubProjectsTosotada " "@gmfe" "@gmfe @To-Fun "
[601] "@GNYIO" "@godaddy" "@Golface "
[604] "@Google" "@google " "@goudai-projects "
[607] "@goworks " "@grab" "@Grab"
[610] "@Grab @myteksi " "@growingio" "@guanghetv "
[613] "@Guazi-inc" "@haici" "@haolianluo "
[616] "@happylifeplat" "@Hengbo" "@heremaps"
[619] "@HIT" "@HKUST-Aerial-Robotics " "@homecredit"
[622] "@honeybadger8 " "@huawei" "@Huawei"
[625] "@HumanBible" "@hunterplus.net" "@huntlabs "
[628] "@hupun" "@hyperledger " "@Hypers "
[631] "@iangeli " "@IBM Research" "@iboxpay "
[634] "@IceBear-666 " "@iflytek" "@IHSVInc "
[637] "@ikang" "@InBuff " "@InfinityStudio & @LWL-Networks "
[640] "@insightfinder" "@ioootech " "@iost-official "
[643] "@iQIYI" "@irdeto" "@itagnjs "
[646] "@jcgroup" "@JDFinance" "@jianshucom "
[649] "@jike-engineering" "@JNUGeek " "@JoyMoe "
[652] "@JumeiRdGroup" "@Jusot " "@jutasky "
[655] "@JXUT-BST @RGB-TEC" "@k2data" "@kayac "
[658] "@keruyun " "@Kesci " "@kfw001 "
[661] "@knownsec" "@Kucoin " "@LambdaInnovation"
[664] "@LaurelHome " "@LearnSolid " "@lianjia-tech"
[667] "@LinkedIn" "@listen-now @SXUOSA @Sele-frontend " "@LiveLucid "
[670] "@lomocoin" "@lotusflare " "@LVMM-H5 "
[673] "@lvxunDev " "@lyft " "@maizuo & @sodalife "
[676] "@maodouio " "@maptalks " "@MapTalks "
[679] "@marklogic " "@McGill" "@MediaKind"
[682] "@MeetYouDevs" "@Meituan" "@Meituan-dianping, Inc"
[685] "@meituan.com" "@Meituan美团" "@meizu"
[688] "@Meowv" "@mercari" "@metrodata"
[691] "@MicroMOOC " "@microstrategy" "@mime-mob "
[694] "@mindbridge-ai" "@Miovision " "@mixi-inc "
[697] "@MoerFinance " "@mogu @opensec-cn " "@Monkee-Boy "
[700] "@moqi-ai @ansrlab " "@moregold " "@MPICP "
[703] "@MSRA" "@MSTechAnLi " "@multisolution "
[706] "@Muxi-Studio " "@mvc9" "@mycodon"
[709] "@MyScript" "@nactro" "@Naver China"
[712] "@ncuhome" "@NeToucher" "@NeusoftSEMI "
[715] "@NiceLabs " "@NJUPT" "@nlitt "
[718] "@NO" "@nodejs 学徒" "@nokia"
[721] "@nomadeducation " "@northdark " "@northeastern"
[724] "@NUAA-Open-Source " "@nuofe " "@nuxt-community"
[727] "@NVIDIA" "@NVIDIA " "@nxintech"
[730] "@NXT-FE " "@nytm " "@ojlm "
[733] "@OmenSec @Aurora-SEC " "@OpenNetworking " "@oracle"
[736] "@orzbox " "@osu-translate-zh" "@Our404 "
[739] "@OurEDA_Lab" "@ours8 " "@p1cn"
[742] "@p1cn " "@Paypal" "@pcit-ce "
[745] "@PDFE @GoliGoliTV " "@petropub " "@pinduoduo"
[748] "@PingPlusPlus " "@plaid" "@platformsh "
[751] "@pogon " "@polar-bears" "@Politiwatch, @PAblueshells, @PAcompsci, & others."
[754] "@ponyai " "@Power2U " "@PPCredit"
[757] "@ppdai" "@Primlo" "@pyspring"
[760] "@qbox " "@qiakr" "@qibancom "
[763] "@qihoo360" "@Qihoo360" "@qiniu"
[766] "@qiniu @qbox" "@qk365.com" "@quixey "
[769] "@qunar.com" "@RainMC " "@rancher "
[772] "@rancherlabs " "@React-Native-Team" "@realidfarm "
[775] "@Redhotminute " "@REDMedis " "@ringcentral "
[778] "@rishiqing " "@riversearch " "@rngame"
[781] "@rongzhilian" "@RootCluster" "@runtimeverification "
[784] "@RyanxJS " "@SafetyCulture" "@santaio"
[787] "@saubyte " "@sec-bit" "@segmentio "
[790] "@seuxw " "@Shapetrace " "@shedaltd "
[793] "@sheenCity" "@ShengQianKuaiBao" "@ShimoFour "
[796] "@Shinetechchina" "@ShinyFrog" "@ShirasagiMoe "
[799] "@Shopify" "@shuopensourcecommunity " "@shuquyun"
[802] "@SicunStudio " "@sildevTeam " "@sillybobo "
[805] "@SJTU" "@SJTU-SE " "@Skylark-Studio "
[808] "@skypool-org" "@Sofihub " "@Soochow University;@IQIYI"
[811] "@sprigs" "@St15IOT " "@star-mine Inc."
[814] "@starrycloud" "@Strikingly" "@sugar-libraries "
[817] "@superatoms " "@superoneio" "@superoneio "
[820] "@susers " "@SUSTC" "@synyi "
[823] "@SYSU-MSC-Studio @wechat-miniprogram" "@TALFE " "@Talkpal"
[826] "@tarsocial " "@tboox & @xmake-io " "@Team-Explorer-Rescue-Robot"
[829] "@team-explorer-rescue-robot " "@teambition" "@teamhola @nodejs "
[832] "@TEamSwifter " "@Tencent " "@Tencent @QSCTech"
[835] "@tensorspace-team " "@thalmic " "@The-Orizon @telegram-zhCN "
[838] "@thenetcircle " "@ThinkSpatial " "@thoughtworks "
[841] "@ThoughtWorks Inc" "@Thoughtworks.com" "@ThoughtWorksInc"
[844] "@ti-net " "@tigerbrokers " "@TINNO-Sugar "
[847] "@Tinwork, @LuluDansMaRue " "@TK" "@Tomorning"
[850] "@Tomorning " "@TPDT @luainkernel " "@trackingio "
[853] "@transferwise " "@Tubitv " "@tuhu "
[856] "@TUMCREATE" "@TuSimple" "@TuyaInc"
[859] "@twitchalerts " "@twitter" "@ucloud"
[862] "@UCloud" "@ucress " "@udesk "
[865] "@UESTC" "@ulb" "@Uniquestudio"
[868] "@UniqueStudio" "@UniqueStudio " "@UniqueStudio @HUSTFE "
[871] "@Unisound" "@university-of-york" "@UnknownStudio "
[874] "@Uplusware" "@USTC-Courses " "@ustclug "
[877] "@V2Git " "@VeniiRobot" "@verydog @cmdboys @sunflower-ui "
[880] "@viabtc @coinexcom" "@vipshop" "@vuese"
[883] "@wanmoe.cn" "@wasmerio" "@webeyemob"
[886] "@weicheche" "@weidian" "@WhatToEatAtNoonToday "
[889] "@White-Album-Lab" "@whmall.com" "@Wi-Q "
[892] "@Wikimedia | @WoCUG " "@Wiredcraft " "@Wish @ContextLogic"
[895] "@WoSai " "@wxmagic " "@XiangWuShuo"
[898] "@Xiaomi" "@XiDeHao" "@XLCW"
[901] "@XMatrixStudio " "@xtTech " "@xueersi"
[904] "@yaochi " "@YHJ-WEB " "@Yigang-SH "
[907] "@YNUOSA " "@young-studio " "@yuni-tech "
[910] "@yurenio " "@zaihui @vuejs" "@ZangaiFamily"
[913] "@zendesk " "@ZenMX " "@Zetyun"
[916] "@zhengruioi" "@zhihu " "@zhiqicloud "
[919] "@Zilliqa" "@ZJU-CC98 " "@ZJUT"
[922] "@zoho" "@zoom" "@zstackio"
[925] "@ZTO-Express " "@ZZES-ZCDC " "@zzus "
[928] "@众人安" "@即刻 @itsCoder " "@客如云"
[931] "@小米" "@巧房 @ReactTemplate @qtonecn @ReactChina" "@极客学院"
[934] "@比特大陆 Bitmain" "@瓜子二手车" "@结婚类网站"
[937] "@铭师堂 @有赞(前)" "*** co.LTD" "*************"
[940] "**************" "**信息科技" "**科技有限公司"
[943] "/university" "` `` `" "<img src='' onerror='alert(1)' />"
[946] "☺" "0" "0.0"
[949] "100offer" "1024.engineer" "1050629507@qq.com"
[952] "111" "111工作室" "115"
[955] "123木头人" "127.0.0.1" "1476102147@qq.com"
[958] "163" "163.com" "1771882991@qq.com"
[961] "1990" "1KE.CO" "2015 Computer Science at HHU"
[964] "209" "213" "21cn"
[967] "222" "234234234" "2345"
[970] "2345.com" "244180439@qq.com" "24好玩"
[973] "263,Inc." "3’s Company" "3vjia"
[976] "3yisu.com" "404." "5151515151"
[979] "51CTO" "51IDC Inc." "51job"
[982] "51NB" "58" "58 Group HRG"
[985] "58ganji" "58同城" "5th"
[988] "61koudai.com" "65370392" "6人游"
[991] "7" "7moor" "9air"
[994] "9fen" "A great company, very very big . " "A jewelry company"
[997] "Abakus" "ABC360" "ABChina"
[1000] "ABCI"
[ reached getOption("max.print") -- omitted 3137 entries ]
# Aggregate disparate company spellings into one name per row.
# `company_aggregation()` is defined outside this section. Calling it on the
# whole `company` column raised "the condition has length > 1 and only the
# first element will be used", which means it branches with scalar `if` tests
# and only the first company decided the outcome for every row. It is
# therefore applied to one company string at a time.
# NOTE(review): assumes the helper returns a single string per input -- confirm.
company_info_agg <- company_info %>%
  mutate(company_agg = purrr::map_chr(company, company_aggregation))
the condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be usedthe condition has length > 1 and only the first element will be used